// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "base/strings/string_split.h"

#include <stddef.h>

#include "base/macros.h"
#include "base/strings/string_util.h"
#include "base/strings/utf_string_conversions.h"
#include "testing/gmock/include/gmock/gmock.h"
#include "testing/gtest/include/gtest/gtest.h"

using ::testing::ElementsAre;

namespace base {

class SplitStringIntoKeyValuePairsTest : public testing::Test {
protected:
    base::StringPairs kv_pairs;
};

TEST_F(SplitStringIntoKeyValuePairsTest, EmptyString)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs(std::string(),
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    EXPECT_TRUE(kv_pairs.empty());
}

TEST_F(SplitStringIntoKeyValuePairsTest, MissingKeyValueDelimiter)
{
    EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1,key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_TRUE(kv_pairs[0].first.empty());
    EXPECT_TRUE(kv_pairs[0].second.empty());
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, EmptyKeyWithKeyValueDelimiter)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs(":value1,key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_TRUE(kv_pairs[0].first.empty());
    EXPECT_EQ("value1", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, TrailingAndLeadingPairDelimiter)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs(",key1:value1,key2:value2,",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("value1", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, EmptyPair)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1,,key3:value3",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("value1", kv_pairs[0].second);
    EXPECT_EQ("key3", kv_pairs[1].first);
    EXPECT_EQ("value3", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, EmptyValue)
{
    EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1:,key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, UntrimmedWhitespace)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1 : value1",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(1U, kv_pairs.size());
    EXPECT_EQ("key1 ", kv_pairs[0].first);
    EXPECT_EQ(" value1", kv_pairs[0].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, TrimmedWhitespace)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1 , key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("value1", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, MultipleKeyValueDelimiters)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:::value1,key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("value1", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, OnlySplitAtGivenSeparator)
{
    std::string a("a ?!@#$%^&*()_+:/{}\\\t\nb");
    EXPECT_TRUE(SplitStringIntoKeyValuePairs(a + "X" + a + "Y" + a + "X" + a,
        'X', // Key-value delimiter
        'Y', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ(a, kv_pairs[0].first);
    EXPECT_EQ(a, kv_pairs[0].second);
    EXPECT_EQ(a, kv_pairs[1].first);
    EXPECT_EQ(a, kv_pairs[1].second);
}

TEST_F(SplitStringIntoKeyValuePairsTest, DelimiterInValue)
{
    EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:va:ue1,key2:value2",
        ':', // Key-value delimiter
        ',', // Key-value pair delimiter
        &kv_pairs));
    ASSERT_EQ(2U, kv_pairs.size());
    EXPECT_EQ("key1", kv_pairs[0].first);
    EXPECT_EQ("va:ue1", kv_pairs[0].second);
    EXPECT_EQ("key2", kv_pairs[1].first);
    EXPECT_EQ("value2", kv_pairs[1].second);
}

TEST(SplitStringUsingSubstrTest, EmptyString)
{
    std::vector<std::string> results;
    SplitStringUsingSubstr(std::string(), "DELIMITER", &results);
    ASSERT_EQ(1u, results.size());
    EXPECT_THAT(results, ElementsAre(""));
}

TEST(StringUtilTest, SplitString_Basics)
{
    std::vector<std::string> r;

    r = SplitString(std::string(), ",:;", KEEP_WHITESPACE, SPLIT_WANT_ALL);
    EXPECT_TRUE(r.empty());

    // Empty separator list
    r = SplitString("hello, world", "", KEEP_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(1u, r.size());
    EXPECT_EQ("hello, world", r[0]);

    // Should split on any of the separators.
    r = SplitString("::,,;;", ",:;", KEEP_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(7u, r.size());
    for (auto str : r)
        ASSERT_TRUE(str.empty());

    r = SplitString("red, green; blue:", ",:;", TRIM_WHITESPACE,
        SPLIT_WANT_NONEMPTY);
    ASSERT_EQ(3u, r.size());
    EXPECT_EQ("red", r[0]);
    EXPECT_EQ("green", r[1]);
    EXPECT_EQ("blue", r[2]);

    // Want to split a string along whitespace sequences.
    r = SplitString("  red green   \tblue\n", " \t\n", TRIM_WHITESPACE,
        SPLIT_WANT_NONEMPTY);
    ASSERT_EQ(3u, r.size());
    EXPECT_EQ("red", r[0]);
    EXPECT_EQ("green", r[1]);
    EXPECT_EQ("blue", r[2]);

    // Weird case of splitting on spaces but not trimming.
    r = SplitString(" red ", " ", TRIM_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(3u, r.size());
    EXPECT_EQ("", r[0]); // Before the first space.
    EXPECT_EQ("red", r[1]);
    EXPECT_EQ("", r[2]); // After the last space.
}

TEST(StringUtilTest, SplitString_WhitespaceAndResultType)
{
    std::vector<std::string> r;

    // Empty input handling.
    r = SplitString(std::string(), ",", KEEP_WHITESPACE, SPLIT_WANT_ALL);
    EXPECT_TRUE(r.empty());
    r = SplitString(std::string(), ",", KEEP_WHITESPACE, SPLIT_WANT_NONEMPTY);
    EXPECT_TRUE(r.empty());

    // Input string is space and we're trimming.
    r = SplitString(" ", ",", TRIM_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(1u, r.size());
    EXPECT_EQ("", r[0]);
    r = SplitString(" ", ",", TRIM_WHITESPACE, SPLIT_WANT_NONEMPTY);
    EXPECT_TRUE(r.empty());

    // Test all 4 combinations of flags on ", ,".
    r = SplitString(", ,", ",", KEEP_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(3u, r.size());
    EXPECT_EQ("", r[0]);
    EXPECT_EQ(" ", r[1]);
    EXPECT_EQ("", r[2]);
    r = SplitString(", ,", ",", KEEP_WHITESPACE, SPLIT_WANT_NONEMPTY);
    ASSERT_EQ(1u, r.size());
    ASSERT_EQ(" ", r[0]);
    r = SplitString(", ,", ",", TRIM_WHITESPACE, SPLIT_WANT_ALL);
    ASSERT_EQ(3u, r.size());
    EXPECT_EQ("", r[0]);
    EXPECT_EQ("", r[1]);
    EXPECT_EQ("", r[2]);
    r = SplitString(", ,", ",", TRIM_WHITESPACE, SPLIT_WANT_NONEMPTY);
    ASSERT_TRUE(r.empty());
}

TEST(SplitStringUsingSubstrTest, StringWithNoDelimiter)
{
    std::vector<std::string> results;
    SplitStringUsingSubstr("alongwordwithnodelimiter", "DELIMITER", &results);
    ASSERT_EQ(1u, results.size());
    EXPECT_THAT(results, ElementsAre("alongwordwithnodelimiter"));
}

TEST(SplitStringUsingSubstrTest, LeadingDelimitersSkipped)
{
    std::vector<std::string> results;
    SplitStringUsingSubstr(
        "DELIMITERDELIMITERDELIMITERoneDELIMITERtwoDELIMITERthree",
        "DELIMITER",
        &results);
    ASSERT_EQ(6u, results.size());
    EXPECT_THAT(results, ElementsAre("", "", "", "one", "two", "three"));
}

TEST(SplitStringUsingSubstrTest, ConsecutiveDelimitersSkipped)
{
    std::vector<std::string> results;
    SplitStringUsingSubstr(
        "unoDELIMITERDELIMITERDELIMITERdosDELIMITERtresDELIMITERDELIMITERcuatro",
        "DELIMITER",
        &results);
    ASSERT_EQ(7u, results.size());
    EXPECT_THAT(results, ElementsAre("uno", "", "", "dos", "tres", "", "cuatro"));
}

TEST(SplitStringUsingSubstrTest, TrailingDelimitersSkipped)
{
    std::vector<std::string> results;
    SplitStringUsingSubstr(
        "unDELIMITERdeuxDELIMITERtroisDELIMITERquatreDELIMITERDELIMITERDELIMITER",
        "DELIMITER",
        &results);
    ASSERT_EQ(7u, results.size());
    EXPECT_THAT(
        results, ElementsAre("un", "deux", "trois", "quatre", "", "", ""));
}

TEST(SplitStringPieceUsingSubstrTest, StringWithNoDelimiter)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr("alongwordwithnodelimiter", "DELIMITER",
        base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(1u, results.size());
    EXPECT_THAT(results, ElementsAre("alongwordwithnodelimiter"));
}

TEST(SplitStringPieceUsingSubstrTest, LeadingDelimitersSkipped)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "DELIMITERDELIMITERDELIMITERoneDELIMITERtwoDELIMITERthree", "DELIMITER",
        base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(6u, results.size());
    EXPECT_THAT(results, ElementsAre("", "", "", "one", "two", "three"));
}

TEST(SplitStringPieceUsingSubstrTest, ConsecutiveDelimitersSkipped)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "unoDELIMITERDELIMITERDELIMITERdosDELIMITERtresDELIMITERDELIMITERcuatro",
        "DELIMITER", base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(7u, results.size());
    EXPECT_THAT(results, ElementsAre("uno", "", "", "dos", "tres", "", "cuatro"));
}

TEST(SplitStringPieceUsingSubstrTest, TrailingDelimitersSkipped)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "unDELIMITERdeuxDELIMITERtroisDELIMITERquatreDELIMITERDELIMITERDELIMITER",
        "DELIMITER", base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(7u, results.size());
    EXPECT_THAT(results,
        ElementsAre("un", "deux", "trois", "quatre", "", "", ""));
}

TEST(SplitStringPieceUsingSubstrTest, KeepWhitespace)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "un DELIMITERdeux\tDELIMITERtrois\nDELIMITERquatre", "DELIMITER",
        base::KEEP_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(4u, results.size());
    EXPECT_THAT(results, ElementsAre("un ", "deux\t", "trois\n", "quatre"));
}

TEST(SplitStringPieceUsingSubstrTest, TrimWhitespace)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "un DELIMITERdeux\tDELIMITERtrois\nDELIMITERquatre", "DELIMITER",
        base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(4u, results.size());
    EXPECT_THAT(results, ElementsAre("un", "deux", "trois", "quatre"));
}

TEST(SplitStringPieceUsingSubstrTest, SplitWantAll)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "unDELIMITERdeuxDELIMITERtroisDELIMITERDELIMITER", "DELIMITER",
        base::TRIM_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(5u, results.size());
    EXPECT_THAT(results, ElementsAre("un", "deux", "trois", "", ""));
}

TEST(SplitStringPieceUsingSubstrTest, SplitWantNonEmpty)
{
    std::vector<base::StringPiece> results = SplitStringPieceUsingSubstr(
        "unDELIMITERdeuxDELIMITERtroisDELIMITERDELIMITER", "DELIMITER",
        base::TRIM_WHITESPACE, base::SPLIT_WANT_NONEMPTY);
    ASSERT_EQ(3u, results.size());
    EXPECT_THAT(results, ElementsAre("un", "deux", "trois"));
}

TEST(StringSplitTest, StringSplitKeepWhitespace)
{
    std::vector<std::string> r;

    r = SplitString("   ", "*", base::KEEP_WHITESPACE, base::SPLIT_WANT_ALL);
    ASSERT_EQ(1U, r.size());
    EXPECT_EQ(r[0], "   ");

    r = SplitString("\t  \ta\t ", "\t", base::KEEP_WHITESPACE,
        base::SPLIT_WANT_ALL);
    ASSERT_EQ(4U, r.size());
    EXPECT_EQ(r[0], "");
    EXPECT_EQ(r[1], "  ");
    EXPECT_EQ(r[2], "a");
    EXPECT_EQ(r[3], " ");

    r = SplitString("\ta\t\nb\tcc", "\n", base::KEEP_WHITESPACE,
        base::SPLIT_WANT_ALL);
    ASSERT_EQ(2U, r.size());
    EXPECT_EQ(r[0], "\ta\t");
    EXPECT_EQ(r[1], "b\tcc");
}

TEST(StringSplitTest, SplitStringAlongWhitespace)
{
    struct TestData {
        const char* input;
        const size_t expected_result_count;
        const char* output1;
        const char* output2;
    } data[] = {
        { "a", 1, "a", "" },
        { " ", 0, "", "" },
        { " a", 1, "a", "" },
        { " ab ", 1, "ab", "" },
        { " ab c", 2, "ab", "c" },
        { " ab c ", 2, "ab", "c" },
        { " ab cd", 2, "ab", "cd" },
        { " ab cd ", 2, "ab", "cd" },
        { " \ta\t", 1, "a", "" },
        { " b\ta\t", 2, "b", "a" },
        { " b\tat", 2, "b", "at" },
        { "b\tat", 2, "b", "at" },
        { "b\t at", 2, "b", "at" },
    };
    for (size_t i = 0; i < arraysize(data); ++i) {
        std::vector<std::string> results = base::SplitString(
            data[i].input, kWhitespaceASCII, base::KEEP_WHITESPACE,
            base::SPLIT_WANT_NONEMPTY);
        ASSERT_EQ(data[i].expected_result_count, results.size());
        if (data[i].expected_result_count > 0)
            ASSERT_EQ(data[i].output1, results[0]);
        if (data[i].expected_result_count > 1)
            ASSERT_EQ(data[i].output2, results[1]);
    }
}

} // namespace base
